
# Prerequisite for Docx2txtLoader. Run this in a shell (or as `%pip install docx2txt`
# in a notebook cell), not as Python code -- a bare `pip install ...` line is a
# SyntaxError in a .py file:
#
#     pip install docx2txt

from langchain.document_loaders import UnstructuredPowerPointLoader
from langchain.document_loaders import UnstructuredExcelLoader

from langchain.document_loaders import UnstructuredPowerPointLoader
from langchain.document_loaders import Docx2txtLoader
from langchain.document_loaders.csv_loader import CSVLoader

# LangChain CSV loader reference: https://python.langchain.com/docs/integrations/document_loaders/csv


# --- PowerPoint: read the sample deck with UnstructuredPowerPointLoader ---
pptx_path = "example_data/fake-power-point.pptx"
loader = UnstructuredPowerPointLoader(pptx_path)
# The loader's output is kept in `data`.
data = loader.load()




# --- Word document: read the sample .docx with Docx2txtLoader ---
docx_path = "example_data/fake.docx"
loader = Docx2txtLoader(docx_path)
# The loader's output is kept in `data`.
data = loader.load()



# --- Excel workbook: read the sample .xlsx with UnstructuredExcelLoader ---
xlsx_path = "example_data/stanley-cups.xlsx"
loader = UnstructuredExcelLoader(
    xlsx_path,
    mode="elements",
)
docs = loader.load()
# Notebook-style peek at the first loaded item. As a plain script this only
# evaluates the expression (nothing is displayed); it raises IndexError if
# `docs` is empty.
docs[0]



# --- CSV: read the sample MLB teams file with CSVLoader ---
csv_path = "./example_data/mlb_teams_2012.csv"
loader = CSVLoader(file_path=csv_path)
# The loader's output is kept in `data`.
data = loader.load()